# clear working environment
rm(list = ls())

#### load the required packages ####
library(tidyverse)
library(PanelMatch)
library(countrycode)

#### load the clean data ####
df <- read_rds("data/dem-transitions-replication-data.rds") %>%
  glimpse()

#### make df into a properly formatted dataframe for PanelMatch ####

# begin coercing df into m
# df needs to be a dataframe class
m <- as.data.frame(df)
# check to see if m is a dataframe
class(m)

# country needs to be an integer to use PanelMatch
m$country <- as.integer(m$country)

# year needs to be an integer to use PanelMatch
m$year <- as.integer(m$year)

# create placebo treatment variables
m <- m %>%
  group_by(country) %>%
  mutate(regime_lead_4 = dplyr::lead(v2x_regime, 4)) %>%
  mutate(regime_lead_6 = dplyr::lead(v2x_regime, 6)) %>%
  mutate(year_lead_4 = dplyr::lead(year, 4)) %>%
  mutate(year_lead_6 = dplyr::lead(year, 6)) %>%
  ungroup() %>%
  glimpse()

m$placebo <- as.numeric(ifelse(m$regime_lead_6 >= 2, 1, 0))

# all other variables, except categorical variables, need to be numeric
m$mid <- as.numeric(m$mid)
m$fatal <- as.numeric(m$fatal)
m$ln_cinc <- as.numeric(m$ln_cinc)
m$ln_pecpp <- as.numeric(m$ln_pecpp)
m$terr_dispute <- as.numeric(m$terr_dispute)
m$v2x_freexp_altinf <- as.numeric(m$v2x_freexp_altinf)
m$v2xlg_legcon <- as.numeric(m$v2xlg_legcon)
m$v2x_cspart <- as.numeric(m$v2x_cspart)
m$v2x_suffr <- as.numeric(m$v2x_suffr)
m$v2fsuffrage <- as.numeric(m$v2fsuffrage)
m$v2msuffrage <- as.numeric(m$v2msuffrage)

# make sure all of the rows are unique
m <- distinct(m, country, year, .keep_all = TRUE)

# df needs to be a dataframe class
m <- as.data.frame(m)
# check to see if m is a dataframe
class(m)

#### effect of democratic transitions on women's de facto suffrage ####
# create panel data
panel <- PanelData(panel.data = m,
                   unit.id = "country",
                   time.id = "year",
                   treatment = "placebo",
                   outcome = "v2fsuffrage")

# create matched sets
PMresults.fvote.att <- PanelMatch(panel.data = panel, lag = 5, refinement.method = "CBPS.weight",
                                  match.missing = TRUE, exact.match.variables = c("un_region"),
                                  covs.formula = ~ I(lag(v2fsuffrage, 1:5)) + I(lag(ln_cinc, 1:5)) + I(lag(ln_pecpp, 1:5)) + I(lag(terr_dispute, 1:5)),
                                  qoi = "att", lead = 1:5, forbid.treatment.reversal = FALSE,
                                  use.diagonal.variance.matrix = TRUE)

# estimate the ATT
PEresults.fvote.att <- PanelEstimate(panel.data = panel, 
                                     sets = PMresults.fvote.att,
                                     se.method = "unconditional", 
                                     confidence.level = .90)

#### effect of democratic transition on men's de facto suffrage ####
# create panel data
panel <- PanelData(panel.data = m,
                   unit.id = "country",
                   time.id = "year",
                   treatment = "placebo",
                   outcome = "v2msuffrage")

# create matched sets
PMresults.mvote.att <- PanelMatch(panel.data = panel, lag = 5, refinement.method = "CBPS.weight",
                                  match.missing = TRUE, exact.match.variables = c("un_region"),
                                  covs.formula = ~ I(lag(v2msuffrage, 1:5)) + I(lag(ln_cinc, 1:5)) + I(lag(ln_pecpp, 1:5)) + I(lag(terr_dispute, 1:5)),
                                  qoi = "att", lead = 1:5, forbid.treatment.reversal = FALSE,
                                  use.diagonal.variance.matrix = TRUE)
# estimate the ATT
PEresults.mvote.att <- PanelEstimate(panel.data = panel, 
                                     sets = PMresults.mvote.att,
                                     se.method = "unconditional", 
                                     confidence.level = .90)

#### create a plot of estimates ####
# assemble plotting data frame
gg <- data.frame(years = rep(c("t-5", "t-4", "t-3", "t-2", "t-1"), 2),
                 estimates = c(PEresults.fvote.att[["estimate"]], PEresults.mvote.att[["estimate"]]),
                 st_error = c(PEresults.fvote.att[["standard.error"]], PEresults.mvote.att[["standard.error"]]),
                 outcome = c(rep("Female Suffrage (de facto)", 5), rep("Male Suffrage (de facto)", 5))) %>%
  mutate(lo_ci = estimates - (1.645*st_error)) %>%
  mutate(hi_ci = estimates + (1.645*st_error)) %>% 
  mutate(significant = as.factor(ifelse(lo_ci > 0 | hi_ci < 0, 1, 0))) %>%
  glimpse()

# create Figure H.2 for the Appendix
ggplot(data = gg, aes(x = reorder(years, desc(years)), color = outcome, shape = outcome)) +
  geom_hline(aes(yintercept = 0), linetype = "dashed", linewidth = .25) +
  geom_pointrange(aes(y = estimates, ymin = lo_ci, ymax = hi_ci), size = .4, linewidth = .7, position = position_dodge(width = .3)) +
  scale_color_manual(values = c("black", "darkgray")) +
  ylim(-15, 20) +
  theme_minimal() +
  theme(legend.position = "bottom",
        axis.text.x = element_text(color = "black", size = 10),
        axis.title.y = element_text(size = 12),
        legend.title = element_text(size = 12)) +
  labs(y = "Effect of Democratic Transition",
       x = "Years Since Transition",
       color = "",
       shape = "")

# save plot
ggsave("figures/suffrage-placebo-att-plot.pdf", width = 5.5, height = 4, units = "in", bg = "white")
